import json



# Location of the dataset; each non-empty line is parsed as one JSON document.
# Raw string literal so the Windows backslashes are taken literally instead of
# being parsed as (invalid) escape sequences such as "\J" or "\d".
DATA_PATH = r'C:\JaredLyu\Project\MiniMind\data\pretrain_hq.jsonl'

with open(DATA_PATH, 'r', encoding='utf-8') as f:
    # Skip blank lines (e.g. a trailing newline at end of file); json.loads
    # would raise JSONDecodeError on an empty string.
    data = [json.loads(stripped) for stripped in map(str.strip, f) if stripped]

print(f"数据集大小: {len(data)}")
# Print the first five records; slicing keeps this safe when the file holds
# fewer than five entries.
for i, entry in enumerate(data[:5], start=1):
    print(f"数据条目 {i}: {entry}")